SQL Stress Testing.¶

By César Pérez

Introduction.¶

In this notebook I'll describe a test comparing the performance of two Python libraries for working with SQL databases: sqlite3 and pyodbc. For this exercise, I am going to focus on INSERT and SELECT statements. I've created two auxiliary scripts that incrementally add rows and columns to an SQLite database and an MSSQL database, capturing timestamps just before and after each task to measure the time taken to complete it. Both scripts create or update a CSV file with values such as: operation performed, rows added, existing rows, start / end times, and their difference. In this notebook, I won't directly describe the scripts I've used to test the performance, but they are available in the links below.
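
Although the scripts themselves aren't reproduced here, the timing capture works along these lines (a minimal sketch; the function name and the callable are hypothetical, while start_op, end_op and time_diff match the CSV columns shown later):

    from datetime import datetime

    def time_operation(run_op):
        # run_op is a hypothetical callable performing one INSERT or SELECT batch
        start_op = datetime.now()
        run_op()
        end_op = datetime.now()
        time_diff = (end_op - start_op).total_seconds()  # seconds, as in the CSV
        return start_op, end_op, time_diff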

Hardware / Software Specs.¶

  • Processor: Intel(R) Core(TM) i5-10300H CPU @ 2.50GHz

  • RAM: 16.0 GB (15.8 GB usable)

  • OS: Windows 10 Home x64

  • Python Libraries: sqlite3, pyodbc (4.0.35)

  • Python version: 3.9.13

Python 3 Scripts.¶

  • SQLite: testSQLite.py
  • MSSQL: testMSSQL.py

Limitations.¶

Even if we want to perform the same operation on both databases, the code cannot be exactly the same. For the SQLite script I've used the method executescript(), and for the MSSQL script I've used the method executemany(), as sketched below.
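
To make the difference concrete, here is a minimal sketch of the two insertion styles. The table, column, file name and connection string below are illustrative assumptions, not the actual test schema:

    import sqlite3
    import pyodbc

    # sqlite3: many statements bundled into one script string, run in a single call.
    con = sqlite3.connect('stress_test.db')  # hypothetical file name
    con.executescript("""
        CREATE TABLE IF NOT EXISTS t (c1 INTEGER);
        INSERT INTO t (c1) VALUES (1);
        INSERT INTO t (c1) VALUES (2);
    """)
    con.commit()
    con.close()

    # pyodbc: one parameterized statement, executed once per parameter tuple.
    conn_str = 'DRIVER={ODBC Driver 17 for SQL Server};SERVER=localhost;DATABASE=test;Trusted_Connection=yes'  # hypothetical
    conn = pyodbc.connect(conn_str)
    cur = conn.cursor()
    cur.executemany("INSERT INTO t (c1) VALUES (?)", [(1,), (2,)])
    conn.commit()
    conn.close()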

Performance Analysis.¶

To analyse the performance, I'm going to:

  1. Read the two CSV files created with the help of the auxiliary scripts mentioned earlier (one having the data from the SQLite database and the second one having the data from the MSSQL database) into pandas dataframes.
  2. Add an additional 'source' column to each dataframe (the values will be 'SQLite' or 'MSSQL').
  3. Concatenate both dataframes (excluding the 'file_size(KB)' column, which only exists in the SQLite data) so that both CSV sources are combined into a single dataframe.
  4. From the concatenated dataframe, create two tables, one for INSERT statements and the second for SELECT statements.
  5. Create visuals per source and SQL command.
In [1]:
# 1. Prepare the environment
import pandas as pd
import seaborn as sns
In [2]:
# 2. Read and prepare data
SQLite_data = pd.read_csv('report_SQLite.csv')
SQLite_data['source'] = 'SQLite'
SQLite_data.head()
Out[2]:
   cols  rows  inserted_rows                    start_op                      end_op  time_diff  operation  file_size(KB)  source
0     1   100            100  2022-07-31 18:03:56.346697  2022-07-31 18:04:00.048014   3.701317     INSERT          160.0  SQLite
1     1   100            100  2022-07-31 18:04:00.063387  2022-07-31 18:04:00.063387   0.000000     SELECT          160.0  SQLite
2     1   300            200  2022-07-31 18:04:00.063387  2022-07-31 18:04:07.452064   7.388677     INSERT          160.0  SQLite
3     1   300            200  2022-07-31 18:04:07.452064  2022-07-31 18:04:07.467377   0.015313     SELECT          160.0  SQLite
4     1   600            300  2022-07-31 18:04:07.467377  2022-07-31 18:04:18.789870  11.322493     INSERT          160.0  SQLite
In [3]:
MSSQL_data = pd.read_csv('report_MSSQL.csv')
MSSQL_data['source'] = 'MSSQL'
MSSQL_data.head()
Out[3]:
   cols  rows  inserted_rows                    start_op                      end_op  time_diff  operation  source
0     1   100            100  2023-02-03 07:42:02.832929  2023-02-03 07:42:02.838674   0.005745     INSERT   MSSQL
1     1   100            100  2023-02-03 07:42:02.853426  2023-02-03 07:42:02.853426   0.000000     SELECT   MSSQL
2     1   300            200  2023-02-03 07:42:02.855421  2023-02-03 07:42:02.865166   0.009745     INSERT   MSSQL
3     1   300            200  2023-02-03 07:42:02.866132  2023-02-03 07:42:02.867129   0.000997     SELECT   MSSQL
4     1   600            300  2023-02-03 07:42:02.868158  2023-02-03 07:42:02.883086   0.014928     INSERT   MSSQL
In [4]:
merged_df = pd.concat([SQLite_data.loc[:, ~SQLite_data.columns.isin(['file_size(KB)'])], MSSQL_data])
merged_df = merged_df.loc[merged_df['time_diff'] < 300]  # remove outliers: drop operations that took 300 seconds or more
merged_df_INSERT = merged_df.loc[merged_df['operation'] == 'INSERT']
merged_df_SELECT = merged_df.loc[merged_df['operation'] == 'SELECT']

INSERT Statement.¶

In [5]:
# 3. Results
# Plot the lines on two facets, source https://seaborn.pydata.org/examples/faceted_lineplot.html 
sns.relplot(
    data=merged_df_INSERT,
    x="inserted_rows", 
    y="time_diff", 
    col="source",
    kind="line", 
    hue="cols",
    height=5,
    aspect=.75, 
    facet_kws=dict(sharex=False), 
    alpha = 0.6
)
Out[5]:
<seaborn.axisgrid.FacetGrid at 0x25d0a8632b0>

SELECT Statement.¶

In [6]:
sns.relplot(
    data=merged_df_SELECT,
    x="rows", 
    y="time_diff", 
    col="source",
    kind="line", 
    hue="cols",
    height=5, 
    aspect=.75, 
    facet_kws=dict(sharex=False), 
    alpha = 0.6
).set_xticklabels(['','0', '20K', '40K', '60K', '80K', '100K', '120K', ''],rotation=30)
Out[6]:
<seaborn.axisgrid.FacetGrid at 0x25d0a863e80>

Conclusions.¶

The results indicate that the MSSQL script, using pyodbc, performs considerably better than the SQLite one. It seems that using SQLite provides portability at the expense of performance.

References.¶

Pandas: McKinney, W., et al. (2010). Data structures for statistical computing in Python. In Proceedings of the 9th Python in Science Conference (Vol. 445, pp. 51–56).

Seaborn: Waskom, M., Botvinnik, O., Kane, D., Hobson, P., Lukauskas, S., Gemperline, D. C., et al. (2017). mwaskom/seaborn: v0.8.1 (September 2017). Zenodo. https://doi.org/10.5281/zenodo.883859